# coding: utf-8
import scrapy

from scrapy import Request
from shili.items import overseasItem

class OverseasSpider(scrapy.Spider):
    """Spider that scrapes the listing table on the iResearch overseas index page.

    One ``overseasItem`` is yielded per data row of the table, carrying the
    text of the row's id cell in its ``sourceid`` field.
    """

    name = "overseas"

    # Scrapy looks for ``allowed_domains`` (bare domain names, not URLs) and
    # ``start_urls``; the previous misspelled attributes were silently ignored,
    # so no request was ever scheduled.
    allowed_domains = ['iresearch.com.cn']
    start_urls = ['https://index.iresearch.com.cn/overseas/']

    # Legacy misspelled names, kept only so that any external code reading
    # them keeps working. Scrapy itself does not use them.
    dllowed_domai = ['https://data.iresearch.com.cn/Home.shtml']
    start_url = start_urls

    def parse(self, respone):
        """Parse the list page and yield one item per table row.

        Args:
            respone: The Scrapy response for a start URL (parameter spelling
                kept as-is for backward compatibility).

        Yields:
            overseasItem: An item whose ``sourceid`` is the text of the
            matching ``td`` cell, or ``None`` when the row has no such cell.
        """
        rows = respone.xpath('//div[@class="list"]/table/tr')

        # The first row is skipped -- presumably the table header; confirm
        # against the live page markup.
        for row in rows[1:]:
            item = overseasItem()
            # NOTE(review): the ``ng-binding`` class suggests this cell may be
            # rendered client-side; verify the value is present in the raw
            # HTML that Scrapy downloads.
            item['sourceid'] = row.xpath(
                'td[@class="cl11 ng-binding grees"]/text()'
            ).extract_first()
            # Yield inside the loop so every row produces an item and nothing
            # is referenced when the table is empty.
            yield item





